In [2]:
import pylab as plt
%matplotlib inline

def read_tab_only(inputfile):
    """Read the first two tab-separated columns of a text file as floats.

    The first line of the file is always skipped (presumably a header row --
    confirm against the .tab files) and empty lines are ignored. Every other
    line is split on tab characters; its first field is appended to the
    ``time`` list and its second field to the ``pitch`` list.

    Parameters
    ----------
    inputfile : str
        Path of the tab-separated file to read.

    Returns
    -------
    (time, pitch) : tuple of two lists of float
        Values of the first and second column, in file order. Both lists are
        empty when the file holds nothing beyond its first line.

    Raises
    ------
    IOError / OSError
        If the file cannot be opened.
    ValueError
        If one of the first two fields of a line is not a valid float.
    IndexError
        If a non-empty line has fewer than two tab-separated fields.
    """
    # Use a context manager so the file handle is closed deterministically;
    # the previous open(...).read() chain never closed it.
    with open(inputfile,'r') as handle:
        lines=handle.read().split('\n')

    time=[]
    pitch=[]
    # lines[1:] drops the first line of the file.
    for line in lines[1:]:
        if line!="":
            fields=line.split('\t')
            time.append(float(fields[0]))
            pitch.append(float(fields[1]))

    return time,pitch
In [3]:
#'pitch/pitcCHJ000001.tab','procd_pitch_newtrim/CHJ000001_proc.tab'
def plot_one_file(pitch_file,procd_file):
    """Overlay the track from ``procd_file`` on the track from ``pitch_file``.

    Both files are read with ``read_tab_only``. A new figure is opened, the
    ``pitch_file`` points are drawn with the 'x' format and the ``procd_file``
    points with the 'ro' format, and the figure is titled with ``procd_file``.

    Parameters
    ----------
    pitch_file : str
        Path of the first .tab file to plot.
    procd_file : str
        Path of the second .tab file to plot; also used as the title.
    """
    # Read both inputs before opening a figure, so a read failure leaves no
    # empty figure behind.
    raw_time, raw_pitch = read_tab_only(pitch_file)
    procd_time, procd_pitch = read_tab_only(procd_file)

    plt.figure()
    # Drawn in this order so the second series sits on top of the first.
    for xs, ys, fmt in ((raw_time, raw_pitch, 'x'),
                        (procd_time, procd_pitch, 'ro')):
        plt.plot(xs, ys, fmt)
    plt.title(procd_file)
In [ ]:
 
In [ ]:
 
In [ ]:
 

version: without unvoiced trimming, T=130 if filter_std < 60 else 200

In [ ]:
 
In [ ]:
 
In [5]:
import random
from os import listdir

# Directory of the original pitch files and directory of the processed files
# that this cell inspects.
pitch_path = 'pitch'
procd_path = 'procd_pitch_newtrim'

# Candidates: every .tab file found in the processed directory.
# NOTE(review): os.listdir returns entries in arbitrary order, so the seeded
# draw below is repeatable only while the listing order stays the same.
onlyfiles = [ f for f in listdir(procd_path) if f.endswith(".tab")]

# Fixed seed so that re-running the cell draws the same 50 files.
SEED=249
random.seed(SEED)
sampled_files=random.sample(onlyfiles,50)
# Parenthesised form prints the same list on Python 2 and is also valid
# syntax on Python 3 (the bare print statement is not).
print(sampled_files)

# One figure per sampled file: original track with the processed track on top.
for file_name in sampled_files:
    # Text before the first '_' identifies the recording; the matching
    # original file is 'pitc' + that name + '.tab' under pitch_path.
    core_name = file_name.split('_')[0]
    pitch_file = pitch_path + "/" + 'pitc' + core_name + '.tab'
    procd_file = procd_path + '/' + file_name
    plot_one_file(pitch_file, procd_file)
['FAJ000521_proc.tab', 'XIN000254_proc.tab', 'FAJ000608_proc.tab', 'SUC000450_proc.tab', 'WAJ000136_proc.tab', 'WAJ000249_proc.tab', 'RUO000389_proc.tab', 'XIN000597_proc.tab', 'DOH000269_proc.tab', 'XIH100315_proc.tab', 'SHH000024_proc.tab', 'XIH100437_proc.tab', 'KOF000122_proc.tab', 'DIL000160_proc.tab', 'WAJ000644_proc.tab', 'OUT000159_proc.tab', 'XIJ000268_proc.tab', 'DOH000127_proc.tab', 'KOF000034_proc.tab', 'XUL001023_proc.tab', 'KOF000146_proc.tab', 'DOH000882_proc.tab', 'OUT000109_proc.tab', 'XIY000215_proc.tab', 'CHX000286_proc.tab', 'SHH000497_proc.tab', 'WAJ000390_proc.tab', 'XIH100407_proc.tab', 'WAJ000043_proc.tab', 'CHX000191_proc.tab', 'DIL000393_proc.tab', 'RUO000278_proc.tab', 'CHX000104_proc.tab', 'MAK000144_proc.tab', 'DOH001566_proc.tab', 'TIK000046_proc.tab', 'CHX000078_proc.tab', 'OUT000014_proc.tab', 'WAJ000090_proc.tab', 'SHH000312_proc.tab', 'DOH000586_proc.tab', 'WAJ001455_proc.tab', 'FAJ001299_proc.tab', 'FAJ000479_proc.tab', 'XIJ000257_proc.tab', 'SHH000369_proc.tab', 'DOH001376_proc.tab', 'DIL000266_proc.tab', 'DOH000919_proc.tab', 'WAJ001734_proc.tab']
In [ ]:
 

version: with unvoiced trimming, T=130 if filter_std < 60 else 200

In [ ]:
 
In [ ]:
 
In [ ]:
 
In [6]:
import random
from os import listdir

# Directory of the original pitch files and directory of the processed files
# that this cell inspects.
pitch_path = 'pitch'
procd_path = 'procd_pitch_newtrim_sec'

# Candidates: every .tab file found in the processed directory.
# NOTE(review): os.listdir returns entries in arbitrary order, so the seeded
# draw below is repeatable only while the listing order stays the same.
onlyfiles = [ f for f in listdir(procd_path) if f.endswith(".tab")]

# Fixed seed so that re-running the cell draws the same 50 files.
SEED=249
random.seed(SEED)
sampled_files=random.sample(onlyfiles,50)
# Parenthesised form prints the same list on Python 2 and is also valid
# syntax on Python 3 (the bare print statement is not).
print(sampled_files)

# One figure per sampled file: original track with the processed track on top.
for file_name in sampled_files:
    # Text before the first '_' identifies the recording; the matching
    # original file is 'pitc' + that name + '.tab' under pitch_path.
    core_name = file_name.split('_')[0]
    pitch_file = pitch_path + "/" + 'pitc' + core_name + '.tab'
    procd_file = procd_path + '/' + file_name
    plot_one_file(pitch_file, procd_file)
['FAJ000521_proc.tab', 'XIN000254_proc.tab', 'FAJ000608_proc.tab', 'SUC000450_proc.tab', 'WAJ000136_proc.tab', 'WAJ000249_proc.tab', 'RUO000389_proc.tab', 'XIN000597_proc.tab', 'DOH000269_proc.tab', 'XIH100315_proc.tab', 'SHH000024_proc.tab', 'XIH100437_proc.tab', 'KOF000122_proc.tab', 'DIL000160_proc.tab', 'WAJ000644_proc.tab', 'OUT000159_proc.tab', 'XIJ000268_proc.tab', 'DOH000127_proc.tab', 'KOF000034_proc.tab', 'XUL001023_proc.tab', 'KOF000146_proc.tab', 'DOH000882_proc.tab', 'OUT000109_proc.tab', 'XIY000215_proc.tab', 'CHX000286_proc.tab', 'SHH000497_proc.tab', 'WAJ000390_proc.tab', 'XIH100407_proc.tab', 'WAJ000043_proc.tab', 'CHX000191_proc.tab', 'DIL000393_proc.tab', 'RUO000278_proc.tab', 'CHX000104_proc.tab', 'MAK000144_proc.tab', 'DOH001566_proc.tab', 'TIK000046_proc.tab', 'CHX000078_proc.tab', 'OUT000014_proc.tab', 'WAJ000090_proc.tab', 'SHH000312_proc.tab', 'DOH000586_proc.tab', 'WAJ001455_proc.tab', 'FAJ001299_proc.tab', 'FAJ000479_proc.tab', 'XIJ000257_proc.tab', 'SHH000369_proc.tab', 'DOH001376_proc.tab', 'DIL000266_proc.tab', 'DOH000919_proc.tab', 'WAJ001734_proc.tab']

version: with unvoiced trimming, T=130 if filter_std < 70 else 200

In [ ]:
 
In [ ]:
 
In [7]:
import random
from os import listdir

# Directory of the original pitch files and directory of the processed files
# that this cell inspects.
pitch_path = 'pitch'
procd_path = 'procd_pitch_newtrim_sec_2'

# Candidates: every .tab file found in the processed directory.
# NOTE(review): os.listdir returns entries in arbitrary order, so the seeded
# draw below is repeatable only while the listing order stays the same.
onlyfiles = [ f for f in listdir(procd_path) if f.endswith(".tab")]

# Fixed seed so that re-running the cell draws the same 50 files.
SEED=249
random.seed(SEED)
sampled_files=random.sample(onlyfiles,50)
# Parenthesised form prints the same list on Python 2 and is also valid
# syntax on Python 3 (the bare print statement is not).
print(sampled_files)

# One figure per sampled file: original track with the processed track on top.
for file_name in sampled_files:
    # Text before the first '_' identifies the recording; the matching
    # original file is 'pitc' + that name + '.tab' under pitch_path.
    core_name = file_name.split('_')[0]
    pitch_file = pitch_path + "/" + 'pitc' + core_name + '.tab'
    procd_file = procd_path + '/' + file_name
    plot_one_file(pitch_file, procd_file)
['FAJ000521_proc.tab', 'XIN000254_proc.tab', 'FAJ000608_proc.tab', 'SUC000450_proc.tab', 'WAJ000136_proc.tab', 'WAJ000249_proc.tab', 'RUO000389_proc.tab', 'XIN000597_proc.tab', 'DOH000269_proc.tab', 'XIH100315_proc.tab', 'SHH000024_proc.tab', 'XIH100437_proc.tab', 'KOF000122_proc.tab', 'DIL000160_proc.tab', 'WAJ000644_proc.tab', 'OUT000159_proc.tab', 'XIJ000268_proc.tab', 'DOH000127_proc.tab', 'KOF000034_proc.tab', 'XUL001023_proc.tab', 'KOF000146_proc.tab', 'DOH000882_proc.tab', 'OUT000109_proc.tab', 'XIY000215_proc.tab', 'CHX000286_proc.tab', 'SHH000497_proc.tab', 'WAJ000390_proc.tab', 'XIH100407_proc.tab', 'WAJ000043_proc.tab', 'CHX000191_proc.tab', 'DIL000393_proc.tab', 'RUO000278_proc.tab', 'CHX000104_proc.tab', 'MAK000144_proc.tab', 'DOH001566_proc.tab', 'TIK000046_proc.tab', 'CHX000078_proc.tab', 'OUT000014_proc.tab', 'WAJ000090_proc.tab', 'SHH000312_proc.tab', 'DOH000586_proc.tab', 'WAJ001455_proc.tab', 'FAJ001299_proc.tab', 'FAJ000479_proc.tab', 'XIJ000257_proc.tab', 'SHH000369_proc.tab', 'DOH001376_proc.tab', 'DIL000266_proc.tab', 'DOH000919_proc.tab', 'WAJ001734_proc.tab']

version: same as above, except that it also filters out short segments (len < 50) and fairly short segments (len < 100) that also start with a high d1

In [9]:
import random
from os import listdir

# Directory of the original pitch files and directory of the processed files
# that this cell inspects.
pitch_path = 'pitch'
procd_path = 'procd_pitch_newtrim_sec_3'

# Candidates: every .tab file found in the processed directory.
# NOTE(review): os.listdir returns entries in arbitrary order, so the seeded
# draw below is repeatable only while the listing order stays the same.
onlyfiles = [ f for f in listdir(procd_path) if f.endswith(".tab")]

# Fixed seed so that re-running the cell draws the same 50 files.
SEED=249
random.seed(SEED)
sampled_files=random.sample(onlyfiles,50)
# Parenthesised form prints the same list on Python 2 and is also valid
# syntax on Python 3 (the bare print statement is not).
print(sampled_files)

# One figure per sampled file: original track with the processed track on top.
for file_name in sampled_files:
    # Text before the first '_' identifies the recording; the matching
    # original file is 'pitc' + that name + '.tab' under pitch_path.
    core_name = file_name.split('_')[0]
    pitch_file = pitch_path + "/" + 'pitc' + core_name + '.tab'
    procd_file = procd_path + '/' + file_name
    plot_one_file(pitch_file, procd_file)
['FAJ000521_proc.tab', 'XIN000254_proc.tab', 'FAJ000608_proc.tab', 'SUC000450_proc.tab', 'WAJ000136_proc.tab', 'WAJ000249_proc.tab', 'RUO000389_proc.tab', 'XIN000597_proc.tab', 'DOH000269_proc.tab', 'XIH100315_proc.tab', 'SHH000024_proc.tab', 'XIH100437_proc.tab', 'KOF000122_proc.tab', 'DIL000160_proc.tab', 'WAJ000644_proc.tab', 'OUT000159_proc.tab', 'XIJ000268_proc.tab', 'DOH000127_proc.tab', 'KOF000034_proc.tab', 'XUL001023_proc.tab', 'KOF000146_proc.tab', 'DOH000882_proc.tab', 'OUT000109_proc.tab', 'XIY000215_proc.tab', 'CHX000286_proc.tab', 'SHH000497_proc.tab', 'WAJ000390_proc.tab', 'XIH100407_proc.tab', 'WAJ000043_proc.tab', 'CHX000191_proc.tab', 'DIL000393_proc.tab', 'RUO000278_proc.tab', 'CHX000104_proc.tab', 'MAK000144_proc.tab', 'DOH001566_proc.tab', 'TIK000046_proc.tab', 'CHX000078_proc.tab', 'OUT000014_proc.tab', 'WAJ000090_proc.tab', 'SHH000312_proc.tab', 'DOH000586_proc.tab', 'WAJ001455_proc.tab', 'FAJ001299_proc.tab', 'FAJ000479_proc.tab', 'XIJ000257_proc.tab', 'SHH000369_proc.tab', 'DOH001376_proc.tab', 'DIL000266_proc.tab', 'DOH000919_proc.tab', 'WAJ001734_proc.tab']
In [ ]:
 
In [ ]:
 

plotting some individual cases

In [ ]:
 
In [16]:
# Single hand-picked recording: plot its original pitch file against the
# processed file from the 'procd_pitch_newtrim' directory.
plot_one_file(
    pitch_file='pitch/pitcXIH000164.tab',
    procd_file='procd_pitch_newtrim/XIH000164_proc.tab',
)
In [ ]:
 
In [ ]:
 
In [ ]:
 
In [ ]:
 
In [ ]:
 
In [ ]:
 
In [ ]:
 
In [ ]: